Personal Computer World 2008 February

home *** CD-ROM | disk | FTP | other *** search

/ Personal Computer World 2008 February / PCWFEB08.iso / Software / Freeware / Miro 1.0 / Miro_Installer.exe / xulrunner / python / subscription.py < prev next >

Wrap

Python Source | 2007-11-12 | 5.7 KB | 176 lines

# Miro - an RSS based video player application # Copyright (C) 2005-2007 Participatory Culture Foundation # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation; either version 2 of the License, or # (at your option) any later version. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program; if not, write to the Free Software # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA import cgi import re import util import urllib2 import urlparse import xml.dom.minidom """ This place's waiting for a little bit of documentation """ # ========================================================================= reflexiveAutoDiscoveryOpener = urllib2.urlopen def parseFile(path): try: subscriptionFile = open(path, "r") content = subscriptionFile.read() subscriptionFile.close() return parseContent(content) except: pass def parseContent(content): try: dom = xml.dom.minidom.parseString(content) root = dom.documentElement if root.nodeName == "rss": urls = _getSubscriptionsFromRSSChannel(root) elif root.nodeName == "feed": urls = _getSubscriptionsFromAtomFeed(root) elif root.nodeName == "opml": urls = _getSubscriptionsFromOPMLOutline(root) else: urls = None dom.unlink() return urls except: import traceback if util.chatter: print "WARNING: Error parsing OPML content..." traceback.print_exc() return None def get_urls_from_query(query): urls = [] for key, value in cgi.parse_qs(query).items(): if re.match(r'url\d+$', key): urls.append(value[0]) return urls def findSubscribeLinks(url): """Given a URL, test if it's trying to subscribe the user using subscribe.getdemocracy.com. Returns the list of parsed URLs. """ try: scheme, host, path, params, query, frag = urlparse.urlparse(url) except: return 'none', [] if host not in ('subscribe.getdemocracy.com', 'subscribe.getmiro.com'): return 'none', [] if path in ('/', '/opml.php'): return 'feed', get_urls_from_query(query) elif path in ('/download.php','/download','/download/'): return 'download', get_urls_from_query(query) elif path in ('/channelguide.php', '/channelguide', '/channelguide/'): return 'guide', get_urls_from_query(query) else: return 'feed', [urllib2.unquote(path[1:])] # ========================================================================= def _getSubscriptionsFromRSSChannel(root): try: channel = root.getElementsByTagName("channel").pop() urls = _getSubscriptionsFromAtomLinkConstruct(channel) if urls is not None: return urls else: link = channel.getElementsByTagName("link").pop() href = link.firstChild.data return _getSubscriptionsFromReflexiveAutoDiscovery(href, "application/rss+xml") except: pass def _getSubscriptionsFromAtomFeed(root): try: urls = _getSubscriptionsFromAtomLinkConstruct(root) if urls is not None: return urls else: link = _getAtomLink(root) rel = link.getAttribute("rel") if rel == "alternate": href = link.getAttribute("href") return _getSubscriptionsFromReflexiveAutoDiscovery(href, "application/atom+xml") except: pass def _getSubscriptionsFromAtomLinkConstruct(node): try: link = _getAtomLink(node) if link.getAttribute("rel") in ("self", "start"): href = link.getAttribute("href") return [href] except: pass def _getSubscriptionsFromReflexiveAutoDiscovery(url, ltype): try: urls = list() html = reflexiveAutoDiscoveryOpener(url).read() for match in re.findall("<link[^>]+>", html): altMatch = re.search("rel=\"alternate\"", match) typeMatch = re.search("type=\"%s\"" % re.escape(ltype), match) hrefMatch = re.search("href=\"([^\"]*)\"", match) if None not in (altMatch, typeMatch, hrefMatch): href = hrefMatch.group(1) urls.append(href) except: urls = None else: if len(urls) == 0: urls = None return urls def _getAtomLink(node): return node.getElementsByTagNameNS("http://www.w3.org/2005/Atom", "link").pop() # ========================================================================= def _getSubscriptionsFromOPMLOutline(root): try: urls = list() body = root.getElementsByTagName("body").pop() _searchOPMLNodeRecursively(body, urls) except: urls = None else: if len(urls) == 0: urls = None return urls def _searchOPMLNodeRecursively(node, urls): try: children = node.childNodes for child in children: if hasattr(child, 'getAttribute'): if child.hasAttribute("xmlUrl"): url = child.getAttribute("xmlUrl") urls.append(url) else: _searchOPMLNodeRecursively(child, urls) except: pass # =========================================================================